From bb974604147a1ee43ef0800981ddef8d36c31a51 Mon Sep 17 00:00:00 2001 From: oliskoli Date: Wed, 4 Jul 2007 20:40:45 +0000 Subject: [PATCH] Extend extra UCS4 to character conversion table. --- gpsbabel/cet/ansi_x3_4_1968.h | 580 +++++++++++++++++++++++----------- 1 file changed, 388 insertions(+), 192 deletions(-) diff --git a/gpsbabel/cet/ansi_x3_4_1968.h b/gpsbabel/cet/ansi_x3_4_1968.h index 700c091b7..f8ce866aa 100644 --- a/gpsbabel/cet/ansi_x3_4_1968.h +++ b/gpsbabel/cet/ansi_x3_4_1968.h @@ -50,196 +50,392 @@ const cet_ucs4_link_t cet_ucs4_to_ansi_x3_4_1968_extra[] = /* !!! sorted by UCS-4 value !!! */ /* ------------------------------------------*/ { - {0x00c0, (unsigned char) 'A'}, // latin capital letter a with grave - {0x00c1, (unsigned char) 'A'}, // latin capital letter a with acute - {0x00C2, (unsigned char) 'A'}, // latin capital letter a with circumflex - {0x00C3, (unsigned char) 'A'}, // latin capital letter a with tilde - {0x00C4, (unsigned char) 'A'}, // latin capital letter a with diaeresis - {0x00C5, (unsigned char) 'A'}, // latin capital letter a with ring above - {0x00C7, (unsigned char) 'C'}, // latin capital letter c with cedilla - {0x00C8, (unsigned char) 'E'}, // latin capital letter e with grave - {0x00C9, (unsigned char) 'E'}, // latin capital letter e with acute - {0x00CA, (unsigned char) 'E'}, // latin capital letter e with circumflex - {0x00CB, (unsigned char) 'E'}, // latin capital letter e with diaeresis - {0x00CC, (unsigned char) 'I'}, // latin capital letter i with grave - {0x00CD, (unsigned char) 'I'}, // latin capital letter i with acute - {0x00CE, (unsigned char) 'I'}, // latin capital letter i with circumflex - {0x00CF, (unsigned char) 'I'}, // latin capital letter i with diaeresis - {0x00D1, (unsigned char) 'N'}, // latin capital letter n with tilde - {0x00D2, (unsigned char) 'O'}, // latin capital letter o with grave - {0x00D3, (unsigned char) 'O'}, // latin capital letter o with acute - {0x00D4, (unsigned char) 'O'}, // latin capital letter o with circumflex - {0x00D5, (unsigned char) 'O'}, // latin capital letter o with tilde - {0x00D6, (unsigned char) 'O'}, // latin capital letter o with diaeresis - {0x00D8, (unsigned char) 'O'}, // latin capital letter o with stroke - {0x00D9, (unsigned char) 'U'}, // latin capital letter u with grave - {0x00DA, (unsigned char) 'U'}, // latin capital letter u with acute - {0x00DB, (unsigned char) 'U'}, // latin capital letter u with circumflex - {0x00DC, (unsigned char) 'U'}, // latin capital letter u with diaeresis - {0x00DD, (unsigned char) 'Y'}, // latin capital letter y with acute - {0x00E0, (unsigned char) 'a'}, // latin small letter a with grave - {0x00E1, (unsigned char) 'a'}, // latin small letter a with acute - {0x00E2, (unsigned char) 'a'}, // latin small letter a with circumflex - {0x00E3, (unsigned char) 'a'}, // latin small letter a with tilde - {0x00E4, (unsigned char) 'a'}, // latin small letter a with diaeresis - {0x00E5, (unsigned char) 'a'}, // latin small letter a with ring above - {0x00E7, (unsigned char) 'c'}, // latin small letter c with cedilla - {0x00E8, (unsigned char) 'e'}, // latin small letter e with grave - {0x00E9, (unsigned char) 'e'}, // latin small letter e with acute - {0x00EA, (unsigned char) 'e'}, // latin small letter e with circumflex - {0x00EB, (unsigned char) 'e'}, // latin small letter e with diaeresis - {0x00EC, (unsigned char) 'i'}, // latin small letter i with grave - {0x00ED, (unsigned char) 'i'}, // latin small letter i with acute - {0x00EE, (unsigned char) 'i'}, // latin small letter i with circumflex - {0x00EF, (unsigned char) 'i'}, // latin small letter i with diaeresis - {0x00F1, (unsigned char) 'n'}, // latin small letter n with tilde - {0x00F2, (unsigned char) 'o'}, // latin small letter o with grave - {0x00F3, (unsigned char) 'o'}, // latin small letter o with acute - {0x00F4, (unsigned char) 'o'}, // latin small letter o with circumflex - {0x00F5, (unsigned char) 'o'}, // latin small letter o with tilde - {0x00F6, (unsigned char) 'o'}, // latin small letter o with diaeresis - {0x00F8, (unsigned char) 'o'}, // latin small letter o with stroke - {0x00F9, (unsigned char) 'u'}, // latin small letter u with grave - {0x00FA, (unsigned char) 'u'}, // latin small letter u with acute - {0x00FB, (unsigned char) 'u'}, // latin small letter u with circumflex - {0x00FC, (unsigned char) 'u'}, // latin small letter u with diaeresis - {0x00FD, (unsigned char) 'y'}, // latin small letter y with acute - {0x00FF, (unsigned char) 'y'}, // latin small letter y with diaeresis - {0x0100, (unsigned char) 'A'}, // latin capital letter a with macron - {0x0101, (unsigned char) 'a'}, // latin small letter a with macron - {0x0102, (unsigned char) 'A'}, // latin capital letter a with breve - {0x0103, (unsigned char) 'a'}, // latin small letter a with breve - {0x0104, (unsigned char) 'A'}, // latin capital letter a with ogonek - {0x0105, (unsigned char) 'a'}, // latin small letter a with ogonek - {0x0106, (unsigned char) 'C'}, // latin capital letter c with acute - {0x0107, (unsigned char) 'c'}, // latin small letter c with acute - {0x0108, (unsigned char) 'C'}, // latin capital letter c with circumflex - {0x0109, (unsigned char) 'c'}, // latin small letter c with circumflex - {0x010A, (unsigned char) 'C'}, // latin capital letter c with dot above - {0x010B, (unsigned char) 'c'}, // latin small letter c with dot above - {0x010C, (unsigned char) 'C'}, // latin capital letter c with caron - {0x010D, (unsigned char) 'c'}, // latin small letter c with caron - {0x010E, (unsigned char) 'D'}, // latin capital letter d with caron - {0x010F, (unsigned char) 'd'}, // latin small letter d with caron - {0x0110, (unsigned char) 'D'}, // latin capital letter d with stroke - {0x0111, (unsigned char) 'd'}, // latin small letter d with stroke - {0x0112, (unsigned char) 'E'}, // latin capital letter e with macron - {0x0113, (unsigned char) 'e'}, // latin small letter e with macron - {0x0116, (unsigned char) 'E'}, // latin capital letter e with dot above - {0x0117, (unsigned char) 'e'}, // latin small letter e with dot above - {0x0118, (unsigned char) 'E'}, // latin capital letter e with ogonek - {0x0119, (unsigned char) 'e'}, // latin small letter e with ogonek - {0x011A, (unsigned char) 'E'}, // latin capital letter e with caron - {0x011B, (unsigned char) 'e'}, // latin small letter e with caron - {0x011C, (unsigned char) 'G'}, // latin capital letter g with circumflex - {0x011D, (unsigned char) 'g'}, // latin small letter g with circumflex - {0x011E, (unsigned char) 'G'}, // latin capital letter g with breve - {0x011F, (unsigned char) 'g'}, // latin small letter g with breve - {0x0120, (unsigned char) 'G'}, // latin capital letter g with dot above - {0x0121, (unsigned char) 'g'}, // latin small letter g with dot above - {0x0122, (unsigned char) 'G'}, // latin capital letter g with cedilla - {0x0123, (unsigned char) 'g'}, // latin small letter g with cedilla - {0x0124, (unsigned char) 'H'}, // latin capital letter h with circumflex - {0x0125, (unsigned char) 'h'}, // latin small letter h with circumflex - {0x0126, (unsigned char) 'H'}, // latin capital letter h with stroke - {0x0127, (unsigned char) 'h'}, // latin small letter h with stroke - {0x0128, (unsigned char) 'I'}, // latin capital letter i with tilde - {0x0129, (unsigned char) 'i'}, // latin small letter i with tilde - {0x012A, (unsigned char) 'I'}, // latin capital letter i with macron - {0x012B, (unsigned char) 'i'}, // latin small letter i with macron - {0x012E, (unsigned char) 'I'}, // latin capital letter i with ogonek - {0x012F, (unsigned char) 'i'}, // latin small letter i with ogonek - {0x0130, (unsigned char) 'I'}, // latin capital letter i with dot above - {0x0134, (unsigned char) 'J'}, // latin capital letter j with circumflex - {0x0135, (unsigned char) 'j'}, // latin small letter j with circumflex - {0x0136, (unsigned char) 'K'}, // latin capital letter k with cedilla - {0x0137, (unsigned char) 'k'}, // latin small letter k with cedilla - {0x0139, (unsigned char) 'L'}, // latin capital letter l with acute - {0x013A, (unsigned char) 'l'}, // latin small letter l with acute - {0x013B, (unsigned char) 'L'}, // latin capital letter l with cedilla - {0x013C, (unsigned char) 'l'}, // latin small letter l with cedilla - {0x013D, (unsigned char) 'L'}, // latin capital letter l with caron - {0x013E, (unsigned char) 'l'}, // latin small letter l with caron - {0x0141, (unsigned char) 'L'}, // latin capital letter l with stroke - {0x0142, (unsigned char) 'l'}, // latin small letter l with stroke - {0x0143, (unsigned char) 'N'}, // latin capital letter n with acute - {0x0144, (unsigned char) 'n'}, // latin small letter n with acute - {0x0145, (unsigned char) 'N'}, // latin capital letter n with cedilla - {0x0146, (unsigned char) 'n'}, // latin small letter n with cedilla - {0x0147, (unsigned char) 'N'}, // latin capital letter n with caron - {0x0148, (unsigned char) 'n'}, // latin small letter n with caron - {0x014C, (unsigned char) 'O'}, // latin capital letter o with macron - {0x014D, (unsigned char) 'o'}, // latin small letter o with macron - {0x0150, (unsigned char) 'O'}, // latin capital letter o with double acute - {0x0151, (unsigned char) 'o'}, // latin small letter o with double acute - {0x0154, (unsigned char) 'R'}, // latin capital letter r with acute - {0x0155, (unsigned char) 'r'}, // latin small letter r with acute - {0x0156, (unsigned char) 'R'}, // latin capital letter r with cedilla - {0x0157, (unsigned char) 'r'}, // latin small letter r with cedilla - {0x0158, (unsigned char) 'R'}, // latin capital letter r with caron - {0x0159, (unsigned char) 'r'}, // latin small letter r with caron - {0x015A, (unsigned char) 'S'}, // latin capital letter s with acute - {0x015B, (unsigned char) 's'}, // latin small letter s with acute - {0x015C, (unsigned char) 'S'}, // latin capital letter s with circumflex - {0x015D, (unsigned char) 's'}, // latin small letter s with circumflex - {0x015E, (unsigned char) 'S'}, // latin capital letter s with cedilla - {0x015F, (unsigned char) 's'}, // latin small letter s with cedilla - {0x0160, (unsigned char) 'S'}, // latin capital letter s with caron - {0x0161, (unsigned char) 's'}, // latin small letter s with caron - {0x0162, (unsigned char) 'T'}, // latin capital letter t with cedilla - {0x0163, (unsigned char) 't'}, // latin small letter t with cedilla - {0x0164, (unsigned char) 'T'}, // latin capital letter t with caron - {0x0165, (unsigned char) 't'}, // latin small letter t with caron - {0x0166, (unsigned char) 'T'}, // latin capital letter t with stroke - {0x0167, (unsigned char) 't'}, // latin small letter t with stroke - {0x0168, (unsigned char) 'U'}, // latin capital letter u with tilde - {0x0169, (unsigned char) 'u'}, // latin small letter u with tilde - {0x016A, (unsigned char) 'U'}, // latin capital letter u with macron - {0x016B, (unsigned char) 'u'}, // latin small letter u with macron - {0x016C, (unsigned char) 'U'}, // latin capital letter u with breve - {0x016D, (unsigned char) 'u'}, // latin small letter u with breve - {0x016E, (unsigned char) 'U'}, // latin capital letter u with ring above - {0x016F, (unsigned char) 'u'}, // latin small letter u with ring above - {0x0170, (unsigned char) 'U'}, // latin capital letter u with double acute - {0x0171, (unsigned char) 'u'}, // latin small letter u with double acute - {0x0172, (unsigned char) 'U'}, // latin capital letter u with ogonek - {0x0173, (unsigned char) 'u'}, // latin small letter u with ogonek - {0x0174, (unsigned char) 'W'}, // latin capital letter w with circumflex - {0x0175, (unsigned char) 'w'}, // latin small letter w with circumflex - {0x0176, (unsigned char) 'Y'}, // latin capital letter y with circumflex - {0x0177, (unsigned char) 'y'}, // latin small letter y with circumflex - {0x0178, (unsigned char) 'Y'}, // latin capital letter y with diaeresis - {0x0179, (unsigned char) 'Z'}, // latin capital letter z with acute - {0x017A, (unsigned char) 'z'}, // latin small letter z with acute - {0x017B, (unsigned char) 'Z'}, // latin capital letter z with dot above - {0x017C, (unsigned char) 'z'}, // latin small letter z with dot above - {0x017D, (unsigned char) 'Z'}, // latin capital letter z with caron - {0x017E, (unsigned char) 'z'}, // latin small letter z with caron - {0x1E02, (unsigned char) 'B'}, // latin capital letter b with dot above - {0x1E03, (unsigned char) 'b'}, // latin small letter b with dot above - {0x1E0A, (unsigned char) 'D'}, // latin capital letter d with dot above - {0x1E0B, (unsigned char) 'd'}, // latin small letter d with dot above - {0x1E1E, (unsigned char) 'F'}, // latin capital letter f with dot above - {0x1E1F, (unsigned char) 'f'}, // latin small letter f with dot above - {0x1E40, (unsigned char) 'M'}, // latin capital letter m with dot above - {0x1E41, (unsigned char) 'm'}, // latin small letter m with dot above - {0x1E56, (unsigned char) 'P'}, // latin capital letter p with dot above - {0x1E57, (unsigned char) 'p'}, // latin small letter p with dot above - {0x1E60, (unsigned char) 'S'}, // latin capital letter s with dot above - {0x1E61, (unsigned char) 's'}, // latin small letter s with dot above - {0x1E6A, (unsigned char) 'T'}, // latin capital letter t with dot above - {0x1E6B, (unsigned char) 't'}, // latin small letter t with dot above - {0x1E80, (unsigned char) 'W'}, // latin capital letter w with grave - {0x1E81, (unsigned char) 'w'}, // latin small letter w with grave - {0x1E82, (unsigned char) 'W'}, // latin capital letter w with acute - {0x1E83, (unsigned char) 'w'}, // latin small letter w with acute - {0x1E84, (unsigned char) 'W'}, // latin capital letter w with diaeresis - {0x1E85, (unsigned char) 'w'}, // latin small letter w with diaeresis - {0x1e94, (unsigned char) 'u'}, - {0x1EF2, (unsigned char) 'Y'}, // latin capital letter y with grave - {0x1EF3, (unsigned char) 'y'}, // latin small letter y with grave - {0x201c, (unsigned char) '"'}, - {0x201d, (unsigned char) '"'} + {0x00C0, (unsigned char) 'A'}, // latin capital letter a with grave + {0x00C1, (unsigned char) 'A'}, // latin capital letter a with acute + {0x00C2, (unsigned char) 'A'}, // latin capital letter a with circumflex + {0x00C3, (unsigned char) 'A'}, // latin capital letter a with tilde + {0x00C4, (unsigned char) 'A'}, // latin capital letter a with diaeresis + {0x00C5, (unsigned char) 'A'}, // latin capital letter a with ring above + {0x00C7, (unsigned char) 'C'}, // latin capital letter c with cedilla + {0x00C8, (unsigned char) 'E'}, // latin capital letter e with grave + {0x00C9, (unsigned char) 'E'}, // latin capital letter e with acute + {0x00CA, (unsigned char) 'E'}, // latin capital letter e with circumflex + {0x00CB, (unsigned char) 'E'}, // latin capital letter e with diaeresis + {0x00CC, (unsigned char) 'I'}, // latin capital letter i with grave + {0x00CD, (unsigned char) 'I'}, // latin capital letter i with acute + {0x00CE, (unsigned char) 'I'}, // latin capital letter i with circumflex + {0x00CF, (unsigned char) 'I'}, // latin capital letter i with diaeresis + {0x00D1, (unsigned char) 'N'}, // latin capital letter n with tilde + {0x00D2, (unsigned char) 'O'}, // latin capital letter o with grave + {0x00D3, (unsigned char) 'O'}, // latin capital letter o with acute + {0x00D4, (unsigned char) 'O'}, // latin capital letter o with circumflex + {0x00D5, (unsigned char) 'O'}, // latin capital letter o with tilde + {0x00D6, (unsigned char) 'O'}, // latin capital letter o with diaeresis + {0x00D8, (unsigned char) 'O'}, // latin capital letter o with stroke + {0x00D9, (unsigned char) 'U'}, // latin capital letter u with grave + {0x00DA, (unsigned char) 'U'}, // latin capital letter u with acute + {0x00DB, (unsigned char) 'U'}, // latin capital letter u with circumflex + {0x00DC, (unsigned char) 'U'}, // latin capital letter u with diaeresis + {0x00DD, (unsigned char) 'Y'}, // latin capital letter y with acute + {0x00E0, (unsigned char) 'a'}, // latin small letter a with grave + {0x00E1, (unsigned char) 'a'}, // latin small letter a with acute + {0x00E2, (unsigned char) 'a'}, // latin small letter a with circumflex + {0x00E3, (unsigned char) 'a'}, // latin small letter a with tilde + {0x00E4, (unsigned char) 'a'}, // latin small letter a with diaeresis + {0x00E5, (unsigned char) 'a'}, // latin small letter a with ring above + {0x00E7, (unsigned char) 'c'}, // latin small letter c with cedilla + {0x00E8, (unsigned char) 'e'}, // latin small letter e with grave + {0x00E9, (unsigned char) 'e'}, // latin small letter e with acute + {0x00EA, (unsigned char) 'e'}, // latin small letter e with circumflex + {0x00EB, (unsigned char) 'e'}, // latin small letter e with diaeresis + {0x00EC, (unsigned char) 'i'}, // latin small letter i with grave + {0x00ED, (unsigned char) 'i'}, // latin small letter i with acute + {0x00EE, (unsigned char) 'i'}, // latin small letter i with circumflex + {0x00EF, (unsigned char) 'i'}, // latin small letter i with diaeresis + {0x00F1, (unsigned char) 'n'}, // latin small letter n with tilde + {0x00F2, (unsigned char) 'o'}, // latin small letter o with grave + {0x00F3, (unsigned char) 'o'}, // latin small letter o with acute + {0x00F4, (unsigned char) 'o'}, // latin small letter o with circumflex + {0x00F5, (unsigned char) 'o'}, // latin small letter o with tilde + {0x00F6, (unsigned char) 'o'}, // latin small letter o with diaeresis + {0x00F8, (unsigned char) 'o'}, // latin small letter o with stroke + {0x00F9, (unsigned char) 'u'}, // latin small letter u with grave + {0x00FA, (unsigned char) 'u'}, // latin small letter u with acute + {0x00FB, (unsigned char) 'u'}, // latin small letter u with circumflex + {0x00FC, (unsigned char) 'u'}, // latin small letter u with diaeresis + {0x00FD, (unsigned char) 'y'}, // latin small letter y with acute + {0x00FF, (unsigned char) 'y'}, // latin small letter y with diaeresis + {0x0100, (unsigned char) 'A'}, // latin capital letter a with macron + {0x0101, (unsigned char) 'a'}, // latin small letter a with macron + {0x0102, (unsigned char) 'A'}, // latin capital letter a with breve + {0x0103, (unsigned char) 'a'}, // latin small letter a with breve + {0x0104, (unsigned char) 'A'}, // latin capital letter a with ogonek + {0x0105, (unsigned char) 'a'}, // latin small letter a with ogonek + {0x0106, (unsigned char) 'C'}, // latin capital letter c with acute + {0x0107, (unsigned char) 'c'}, // latin small letter c with acute + {0x0108, (unsigned char) 'C'}, // latin capital letter c with circumflex + {0x0109, (unsigned char) 'c'}, // latin small letter c with circumflex + {0x010A, (unsigned char) 'C'}, // latin capital letter c with dot above + {0x010B, (unsigned char) 'c'}, // latin small letter c with dot above + {0x010C, (unsigned char) 'C'}, // latin capital letter c with caron + {0x010D, (unsigned char) 'c'}, // latin small letter c with caron + {0x010E, (unsigned char) 'D'}, // latin capital letter d with caron + {0x010F, (unsigned char) 'd'}, // latin small letter d with caron + {0x0110, (unsigned char) 'D'}, // latin capital letter d with stroke + {0x0111, (unsigned char) 'd'}, // latin small letter d with stroke + {0x0112, (unsigned char) 'E'}, // latin capital letter e with macron + {0x0113, (unsigned char) 'e'}, // latin small letter e with macron + {0x0114, (unsigned char) 'E'}, // latin capital letter e with breve + {0x0115, (unsigned char) 'e'}, // latin small letter e with breve + {0x0116, (unsigned char) 'E'}, // latin capital letter e with dot above + {0x0117, (unsigned char) 'e'}, // latin small letter e with dot above + {0x0118, (unsigned char) 'E'}, // latin capital letter e with ogonek + {0x0119, (unsigned char) 'e'}, // latin small letter e with ogonek + {0x011A, (unsigned char) 'E'}, // latin capital letter e with caron + {0x011B, (unsigned char) 'e'}, // latin small letter e with caron + {0x011C, (unsigned char) 'G'}, // latin capital letter g with circumflex + {0x011D, (unsigned char) 'g'}, // latin small letter g with circumflex + {0x011E, (unsigned char) 'G'}, // latin capital letter g with breve + {0x011F, (unsigned char) 'g'}, // latin small letter g with breve + {0x0120, (unsigned char) 'G'}, // latin capital letter g with dot above + {0x0121, (unsigned char) 'g'}, // latin small letter g with dot above + {0x0122, (unsigned char) 'G'}, // latin capital letter g with cedilla + {0x0123, (unsigned char) 'g'}, // latin small letter g with cedilla + {0x0124, (unsigned char) 'H'}, // latin capital letter h with circumflex + {0x0125, (unsigned char) 'h'}, // latin small letter h with circumflex + {0x0126, (unsigned char) 'H'}, // latin capital letter h with stroke + {0x0127, (unsigned char) 'h'}, // latin small letter h with stroke + {0x0128, (unsigned char) 'I'}, // latin capital letter i with tilde + {0x0129, (unsigned char) 'i'}, // latin small letter i with tilde + {0x012A, (unsigned char) 'I'}, // latin capital letter i with macron + {0x012B, (unsigned char) 'i'}, // latin small letter i with macron + {0x012C, (unsigned char) 'I'}, // latin capital letter i with breve + {0x012D, (unsigned char) 'i'}, // latin small letter i with breve + {0x012E, (unsigned char) 'I'}, // latin capital letter i with ogonek + {0x012F, (unsigned char) 'i'}, // latin small letter i with ogonek + {0x0130, (unsigned char) 'I'}, // latin capital letter i with dot above + {0x0131, (unsigned char) 'i'}, // latin small letter dotless i + {0x0134, (unsigned char) 'J'}, // latin capital letter j with circumflex + {0x0135, (unsigned char) 'j'}, // latin small letter j with circumflex + {0x0136, (unsigned char) 'K'}, // latin capital letter k with cedilla + {0x0137, (unsigned char) 'k'}, // latin small letter k with cedilla + {0x0139, (unsigned char) 'L'}, // latin capital letter l with acute + {0x013A, (unsigned char) 'l'}, // latin small letter l with acute + {0x013B, (unsigned char) 'L'}, // latin capital letter l with cedilla + {0x013C, (unsigned char) 'l'}, // latin small letter l with cedilla + {0x013D, (unsigned char) 'L'}, // latin capital letter l with caron + {0x013E, (unsigned char) 'l'}, // latin small letter l with caron + {0x0141, (unsigned char) 'L'}, // latin capital letter l with stroke + {0x0142, (unsigned char) 'l'}, // latin small letter l with stroke + {0x0143, (unsigned char) 'N'}, // latin capital letter n with acute + {0x0144, (unsigned char) 'n'}, // latin small letter n with acute + {0x0145, (unsigned char) 'N'}, // latin capital letter n with cedilla + {0x0146, (unsigned char) 'n'}, // latin small letter n with cedilla + {0x0147, (unsigned char) 'N'}, // latin capital letter n with caron + {0x0148, (unsigned char) 'n'}, // latin small letter n with caron + {0x014C, (unsigned char) 'O'}, // latin capital letter o with macron + {0x014D, (unsigned char) 'o'}, // latin small letter o with macron + {0x014E, (unsigned char) 'O'}, // latin capital letter o with breve + {0x014F, (unsigned char) 'o'}, // latin small letter o with breve + {0x0150, (unsigned char) 'O'}, // latin capital letter o with double acute + {0x0151, (unsigned char) 'o'}, // latin small letter o with double acute + {0x0152, (unsigned char) 'O'}, // latin capital ligature oe + {0x0153, (unsigned char) 'o'}, // latin small ligature oe + {0x0154, (unsigned char) 'R'}, // latin capital letter r with acute + {0x0155, (unsigned char) 'r'}, // latin small letter r with acute + {0x0156, (unsigned char) 'R'}, // latin capital letter r with cedilla + {0x0157, (unsigned char) 'r'}, // latin small letter r with cedilla + {0x0158, (unsigned char) 'R'}, // latin capital letter r with caron + {0x0159, (unsigned char) 'r'}, // latin small letter r with caron + {0x015A, (unsigned char) 'S'}, // latin capital letter s with acute + {0x015B, (unsigned char) 's'}, // latin small letter s with acute + {0x015C, (unsigned char) 'S'}, // latin capital letter s with circumflex + {0x015D, (unsigned char) 's'}, // latin small letter s with circumflex + {0x015E, (unsigned char) 'S'}, // latin capital letter s with cedilla + {0x015F, (unsigned char) 's'}, // latin small letter s with cedilla + {0x0160, (unsigned char) 'S'}, // latin capital letter s with caron + {0x0161, (unsigned char) 's'}, // latin small letter s with caron + {0x0162, (unsigned char) 'T'}, // latin capital letter t with cedilla + {0x0163, (unsigned char) 't'}, // latin small letter t with cedilla + {0x0164, (unsigned char) 'T'}, // latin capital letter t with caron + {0x0165, (unsigned char) 't'}, // latin small letter t with caron + {0x0166, (unsigned char) 'T'}, // latin capital letter t with stroke + {0x0167, (unsigned char) 't'}, // latin small letter t with stroke + {0x0168, (unsigned char) 'U'}, // latin capital letter u with tilde + {0x0169, (unsigned char) 'u'}, // latin small letter u with tilde + {0x016A, (unsigned char) 'U'}, // latin capital letter u with macron + {0x016B, (unsigned char) 'u'}, // latin small letter u with macron + {0x016C, (unsigned char) 'U'}, // latin capital letter u with breve + {0x016D, (unsigned char) 'u'}, // latin small letter u with breve + {0x016E, (unsigned char) 'U'}, // latin capital letter u with ring above + {0x016F, (unsigned char) 'u'}, // latin small letter u with ring above + {0x0170, (unsigned char) 'U'}, // latin capital letter u with double acute + {0x0171, (unsigned char) 'u'}, // latin small letter u with double acute + {0x0172, (unsigned char) 'U'}, // latin capital letter u with ogonek + {0x0173, (unsigned char) 'u'}, // latin small letter u with ogonek + {0x0174, (unsigned char) 'W'}, // latin capital letter w with circumflex + {0x0175, (unsigned char) 'w'}, // latin small letter w with circumflex + {0x0176, (unsigned char) 'Y'}, // latin capital letter y with circumflex + {0x0177, (unsigned char) 'y'}, // latin small letter y with circumflex + {0x0178, (unsigned char) 'Y'}, // latin capital letter y with diaeresis + {0x0179, (unsigned char) 'Z'}, // latin capital letter z with acute + {0x017A, (unsigned char) 'z'}, // latin small letter z with acute + {0x017B, (unsigned char) 'Z'}, // latin capital letter z with dot above + {0x017C, (unsigned char) 'z'}, // latin small letter z with dot above + {0x017D, (unsigned char) 'Z'}, // latin capital letter z with caron + {0x017E, (unsigned char) 'z'}, // latin small letter z with caron + {0x0180, (unsigned char) 'b'}, // latin small letter b with stroke + {0x0189, (unsigned char) 'D'}, // latin capital letter african d + {0x0191, (unsigned char) 'F'}, // latin capital letter f with hook + {0x0192, (unsigned char) 'f'}, // latin small letter f with hook + {0x0197, (unsigned char) 'I'}, // latin capital letter i with stroke + {0x019A, (unsigned char) 'l'}, // latin small letter l with bar + {0x019F, (unsigned char) 'O'}, // latin capital letter o with middle tilde + {0x01A0, (unsigned char) 'O'}, // latin capital letter o with horn + {0x01A1, (unsigned char) 'o'}, // latin small letter o with horn + {0x01AB, (unsigned char) 't'}, // latin small letter t with palatal hook + {0x01AE, (unsigned char) 'T'}, // latin capital letter t with retroflex hook + {0x01AF, (unsigned char) 'U'}, // latin capital letter u with horn + {0x01B0, (unsigned char) 'u'}, // latin small letter u with horn + {0x01B6, (unsigned char) 'z'}, // latin small letter z with stroke + {0x01C0, (unsigned char) '|'}, // latin letter dental click + {0x01C3, (unsigned char) '!'}, // latin letter retroflex click + {0x01CD, (unsigned char) 'A'}, // latin capital letter a with caron + {0x01CE, (unsigned char) 'a'}, // latin small letter a with caron + {0x01CF, (unsigned char) 'I'}, // latin capital letter i with caron + {0x01D0, (unsigned char) 'i'}, // latin small letter i with caron + {0x01D1, (unsigned char) 'O'}, // latin capital letter o with caron + {0x01D2, (unsigned char) 'o'}, // latin small letter o with caron + {0x01D3, (unsigned char) 'U'}, // latin capital letter u with caron + {0x01D4, (unsigned char) 'u'}, // latin small letter u with caron + {0x01D5, (unsigned char) 'U'}, // latin capital letter u with diaeresis and macron + {0x01D6, (unsigned char) 'u'}, // latin small letter u with diaeresis and macron + {0x01D7, (unsigned char) 'U'}, // latin capital letter u with diaeresis and acute + {0x01D8, (unsigned char) 'u'}, // latin small letter u with diaeresis and acute + {0x01D9, (unsigned char) 'U'}, // latin capital letter u with diaeresis and caron + {0x01DA, (unsigned char) 'u'}, // latin small letter u with diaeresis and caron + {0x01DB, (unsigned char) 'U'}, // latin capital letter u with diaeresis and grave + {0x01DC, (unsigned char) 'u'}, // latin small letter u with diaeresis and grave + {0x01DE, (unsigned char) 'A'}, // latin capital letter a with diaeresis and macron + {0x01DF, (unsigned char) 'a'}, // latin small letter a with diaeresis and macron + {0x01E4, (unsigned char) 'G'}, // latin capital letter g with stroke + {0x01E5, (unsigned char) 'g'}, // latin small letter g with stroke + {0x01E6, (unsigned char) 'G'}, // latin capital letter g with caron + {0x01E7, (unsigned char) 'g'}, // latin small letter g with caron + {0x01E8, (unsigned char) 'K'}, // latin capital letter k with caron + {0x01E9, (unsigned char) 'k'}, // latin small letter k with caron + {0x01EA, (unsigned char) 'O'}, // latin capital letter o with ogonek + {0x01EB, (unsigned char) 'o'}, // latin small letter o with ogonek + {0x01EC, (unsigned char) 'O'}, // latin capital letter o with ogonek and macron + {0x01ED, (unsigned char) 'o'}, // latin small letter o with ogonek and macron + {0x01F0, (unsigned char) 'j'}, // latin small letter j with caron + {0x0261, (unsigned char) 'g'}, // latin small letter script g + {0x02B9, (unsigned char) '\''}, // modifier letter prime + {0x02BA, (unsigned char) '"'}, // modifier letter double prime + {0x02BC, (unsigned char) '\''}, // modifier letter apostrophe + {0x02C4, (unsigned char) '^'}, // modifier letter up arrowhead + {0x02C6, (unsigned char) '^'}, // modifier letter circumflex accent + {0x02C7, (unsigned char) '^'}, // caron + {0x02C8, (unsigned char) '\''}, // modifier letter vertical line + {0x02CB, (unsigned char) '`'}, // modifier letter grave accent + {0x02CD, (unsigned char) '_'}, // modifier letter low macron + {0x02D8, (unsigned char) '^'}, // circumflex accent + {0x02D9, (unsigned char) '\''}, // dot above + {0x02DC, (unsigned char) '~'}, // small tilde + {0x0300, (unsigned char) '`'}, // combining grave accent + {0x0302, (unsigned char) '^'}, // combining circumflex accent + {0x0303, (unsigned char) '~'}, // combining tilde + {0x030E, (unsigned char) '"'}, // combining double vertical line above + {0x0331, (unsigned char) '_'}, // combining macron below + {0x0332, (unsigned char) '_'}, // combining low line + {0x037E, (unsigned char) ';'}, // greek question mark + {0x0393, (unsigned char) 'G'}, // greek capital letter gamma + {0x0398, (unsigned char) 'T'}, // greek capital letter theta + {0x03A3, (unsigned char) 'S'}, // greek capital letter sigma + {0x03A6, (unsigned char) 'F'}, // greek capital letter phi + {0x03A9, (unsigned char) 'O'}, // greek capital letter omega + {0x03B1, (unsigned char) 'a'}, // greek small letter alpha + {0x03B4, (unsigned char) 'd'}, // greek small letter delta + {0x03B5, (unsigned char) 'e'}, // greek small letter epsilon + {0x03C0, (unsigned char) 'p'}, // greek small letter pi + {0x03C3, (unsigned char) 's'}, // greek small letter sigma + {0x03C4, (unsigned char) 't'}, // greek small letter tau + {0x03C6, (unsigned char) 'f'}, // greek small letter phi + {0x04BB, (unsigned char) 'h'}, // cyrillic small letter shha + {0x0589, (unsigned char) ':'}, // armenian full stop + {0x066A, (unsigned char) '%'}, // arabic percent sign + {0x1E02, (unsigned char) 'B'}, // latin capital letter b with dot above + {0x1E03, (unsigned char) 'b'}, // latin small letter b with dot above + {0x1E0A, (unsigned char) 'D'}, // latin capital letter d with dot above + {0x1E0B, (unsigned char) 'd'}, // latin small letter d with dot above + {0x1E1E, (unsigned char) 'F'}, // latin capital letter f with dot above + {0x1E1F, (unsigned char) 'f'}, // latin small letter f with dot above + {0x1E40, (unsigned char) 'M'}, // latin capital letter m with dot above + {0x1E41, (unsigned char) 'm'}, // latin small letter m with dot above + {0x1E56, (unsigned char) 'P'}, // latin capital letter p with dot above + {0x1E57, (unsigned char) 'p'}, // latin small letter p with dot above + {0x1E60, (unsigned char) 'S'}, // latin capital letter s with dot above + {0x1E61, (unsigned char) 's'}, // latin small letter s with dot above + {0x1E6A, (unsigned char) 'T'}, // latin capital letter t with dot above + {0x1E6B, (unsigned char) 't'}, // latin small letter t with dot above + {0x1E80, (unsigned char) 'W'}, // latin capital letter w with grave + {0x1E81, (unsigned char) 'w'}, // latin small letter w with grave + {0x1E82, (unsigned char) 'W'}, // latin capital letter w with acute + {0x1E83, (unsigned char) 'w'}, // latin small letter w with acute + {0x1E84, (unsigned char) 'W'}, // latin capital letter w with diaeresis + {0x1E85, (unsigned char) 'w'}, // latin small letter w with diaeresis + {0x1E94, (unsigned char) 'u'}, + {0x1EF2, (unsigned char) 'Y'}, // latin capital letter y with grave + {0x1EF3, (unsigned char) 'y'}, // latin small letter y with grave + {0x2000, (unsigned char) ' '}, // en quad + {0x2001, (unsigned char) ' '}, // em quad + {0x2002, (unsigned char) ' '}, // en space + {0x2003, (unsigned char) ' '}, // em space + {0x2004, (unsigned char) ' '}, // three-per-em space + {0x2005, (unsigned char) ' '}, // four-per-em space + {0x2006, (unsigned char) ' '}, // six-per-em space + {0x2010, (unsigned char) '-'}, // hyphen + {0x2011, (unsigned char) '-'}, // non-breaking hyphen + {0x2017, (unsigned char) '='}, // double low line + {0x201C, (unsigned char) '"'}, + {0x201D, (unsigned char) '"'}, + {0x2032, (unsigned char) '\''}, // prime + {0x2035, (unsigned char) '`'}, // reversed prime + {0x203C, (unsigned char) '!'}, // double exclamation mark + {0x2044, (unsigned char) '/'}, // fraction slash + {0x2074, (unsigned char) '4'}, // superscript four + {0x2075, (unsigned char) '5'}, // superscript five + {0x2076, (unsigned char) '6'}, // superscript six + {0x2077, (unsigned char) '7'}, // superscript seven + {0x2078, (unsigned char) '8'}, // superscript eight + {0x207F, (unsigned char) 'n'}, // superscript latin small letter n + {0x2080, (unsigned char) '0'}, // subscript zero + {0x2081, (unsigned char) '1'}, // subscript one + {0x2082, (unsigned char) '2'}, // subscript two + {0x2083, (unsigned char) '3'}, // subscript three + {0x2084, (unsigned char) '4'}, // subscript four + {0x2085, (unsigned char) '5'}, // subscript five + {0x2086, (unsigned char) '6'}, // subscript six + {0x2087, (unsigned char) '7'}, // subscript seven + {0x2088, (unsigned char) '8'}, // subscript eight + {0x2089, (unsigned char) '9'}, // subscript nine + {0x20A7, (unsigned char) 'P'}, // peseta sign + {0x2102, (unsigned char) 'C'}, // double-struck capital c + {0x2107, (unsigned char) 'E'}, // euler constant + {0x210A, (unsigned char) 'g'}, // script small g + {0x210B, (unsigned char) 'H'}, // script capital h + {0x210C, (unsigned char) 'H'}, // black-letter capital h + {0x210D, (unsigned char) 'H'}, // double-struck capital h + {0x210E, (unsigned char) 'h'}, // planck constant + {0x2110, (unsigned char) 'I'}, // script capital i + {0x2111, (unsigned char) 'I'}, // black-letter capital i + {0x2112, (unsigned char) 'L'}, // script capital l + {0x2113, (unsigned char) 'l'}, // script small l + {0x2115, (unsigned char) 'N'}, // double-struck capital n + {0x2118, (unsigned char) 'P'}, // script capital p + {0x2119, (unsigned char) 'P'}, // double-struck capital p + {0x211A, (unsigned char) 'Q'}, // double-struck capital q + {0x211B, (unsigned char) 'R'}, // script capital r + {0x211C, (unsigned char) 'R'}, // black-letter capital r + {0x211D, (unsigned char) 'R'}, // double-struck capital r + {0x2124, (unsigned char) 'Z'}, // double-struck capital z + {0x2128, (unsigned char) 'Z'}, // black-letter capital z + {0x212A, (unsigned char) 'K'}, // kelvin sign + {0x212C, (unsigned char) 'B'}, // script capital b + {0x212D, (unsigned char) 'C'}, // black-letter capital c + {0x212E, (unsigned char) 'e'}, // estimated symbol + {0x212F, (unsigned char) 'e'}, // script small e + {0x2130, (unsigned char) 'E'}, // script capital e + {0x2131, (unsigned char) 'F'}, // script capital f + {0x2133, (unsigned char) 'M'}, // script capital m + {0x2134, (unsigned char) 'o'}, // script small o + {0x2190, (unsigned char) '<'}, // leftwards arrow + {0x2191, (unsigned char) '^'}, // upwards arrow + {0x2192, (unsigned char) '>'}, // rightwards arrow + {0x2193, (unsigned char) 'v'}, // downwards arrow + {0x2194, (unsigned char) '-'}, // left right arrow + {0x2195, (unsigned char) '|'}, // up down arrow + {0x21A8, (unsigned char) '|'}, // up down arrow with base + {0x2212, (unsigned char) '-'}, // minus sign + {0x2215, (unsigned char) '/'}, // division slash + {0x2216, (unsigned char) '\\'}, // set minus + {0x2217, (unsigned char) '*'}, // asterisk operator + {0x221A, (unsigned char) 'v'}, // square root + {0x221E, (unsigned char) '8'}, // infinity + {0x221F, (unsigned char) 'L'}, // right angle + {0x2223, (unsigned char) '|'}, // divides + {0x2229, (unsigned char) 'n'}, // intersection + {0x2236, (unsigned char) ':'}, // ratio + {0x223C, (unsigned char) '~'}, // tilde operator + {0x2261, (unsigned char) '='}, // identical to + {0x2264, (unsigned char) '='}, // less-than or equal to + {0x2265, (unsigned char) '='}, // greater-than or equal to + {0x2303, (unsigned char) '^'}, // up arrowhead + {0x2320, (unsigned char) '('}, // top half integral + {0x2321, (unsigned char) ')'}, // bottom half integral + {0x2329, (unsigned char) '<'}, // left-pointing angle bracket + {0x232A, (unsigned char) '>'}, // right-pointing angle bracket + {0x25AC, (unsigned char) '-'}, // black rectangle + {0x25B2, (unsigned char) '^'}, // black up-pointing triangle + {0x25BA, (unsigned char) '>'}, // black right-pointing pointer + {0x25C4, (unsigned char) '<'}, // black left-pointing pointer + {0x25CB, (unsigned char) '0'}, // white circle + {0x25D9, (unsigned char) '0'}, // inverse white circle + {0x263A, (unsigned char) 'O'}, // white smiling face + {0x263B, (unsigned char) 'O'}, // black smiling face + {0x263C, (unsigned char) '0'}, // white sun with rays + {0x2640, (unsigned char) '+'}, // female sign + {0x2642, (unsigned char) '>'}, // male sign + {0x266A, (unsigned char) 'd'}, // eighth note + {0x266B, (unsigned char) 'd'}, // beamed eighth notes + {0x2758, (unsigned char) '|'}, // light vertical bar + {0x3000, (unsigned char) ' '}, // ideographic space + {0x3008, (unsigned char) '<'}, // left angle bracket + {0x3009, (unsigned char) '>'}, // right angle bracket + {0x301A, (unsigned char) '['}, // left white square bracket + {0x301B, (unsigned char) ']'}, // right white square bracket + {0x301D, (unsigned char) '"'}, // reversed double prime quotation mark + {0x301E, (unsigned char) '"'} // double prime quotation mark }; cet_cs_vec_t cet_cs_vec_ansi_x3_4_1968 = /* defined in cet.h */ @@ -247,8 +443,8 @@ cet_cs_vec_t cet_cs_vec_ansi_x3_4_1968 = /* defined in cet.h */ cet_cs_name_ansi_x3_4_1968, /* name of character set */ cet_cs_alias_ansi_x3_4_1968, /* alias table */ - NULL, /* ... to UCS-4 converter (multi-byte) */ - NULL, /* UCS-4 to ... converter (multi-byte) */ + NULL, /* fallback character set */ + NULL, /* unused */ cet_ucs4_map_ansi_x3_4_1968, /* char to UCS-4 value table */ cet_ucs4_ofs_ansi_x3_4_1968, /* first non standard character */ -- 2.30.2